from langchain.document_loaders import UnstructuredHTMLLoader, BSHTMLLoader


def normal_html_loader():
    """Load the sample HTML file with ``UnstructuredHTMLLoader`` and print it.

    Builds a loader for ``files/fake-content.html``, calls its ``load()``
    method, and prints whatever that call returns to standard output.
    Takes no arguments and returns ``None``.
    """
    html_path = "files/fake-content.html"
    documents = UnstructuredHTMLLoader(html_path).load()
    print(documents)


def html_loader_with_beautiful_soup4():
    """Load the sample HTML file with ``BSHTMLLoader`` and print it.

    Builds a ``BSHTMLLoader`` for ``files/fake-content.html`` and prints
    the value returned by its ``load()`` method to standard output.
    Takes no arguments and returns ``None``.
    """
    bs_loader = BSHTMLLoader("files/fake-content.html")
    print(bs_loader.load())


if __name__ == "__main__":
    # When executed as a script, only the BSHTMLLoader demo runs;
    # normal_html_loader() is defined above but not invoked here.
    html_loader_with_beautiful_soup4()